{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 翻页：参数字典的拆解\n",
    "## xpath解析翻页a/@href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [],
   "source": [
    "from requests_html import HTMLSession\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "import pandas as pd\n",
    "session =HTMLSession()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[]\n",
      "{}\n"
     ]
    }
   ],
   "source": [
    "# A-1  Parse the pagination links (a/@href) with XPath.\n",
    "# A bare '//div[@class=\"pagerbar\"]/a' also matches the disabled/current\n",
    "# anchors whose href is javascript, so keep only hrefs starting with /zhaopin.\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "\n",
    "# Evaluate the XPath once and reuse the matched elements below.\n",
    "# NOTE(review): `r` is not assigned in this cell; it must already hold the\n",
    "# search-result response when this cell runs.\n",
    "翻页元素 = r.html.xpath(xpath_翻页a)\n",
    "print (翻页元素) # Element objects\n",
    "\n",
    "href_列表 = [x.xpath('//@href')[0] for x in 翻页元素]\n",
    "#print (href_列表)\n",
    "\n",
    "文字_列表 = [x.text for x in 翻页元素]\n",
    "#print (文字_列表)\n",
    "\n",
    "# Link text -> href\n",
    "href_字典 = dict(zip(文字_列表, href_列表))\n",
    "print (href_字典)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "## Build the parameter template\n",
    "\n",
    "# Last week B-1: parse the URLs with urllib.parse\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "\n",
    "\n",
    "# Last week B-2: load the parts into a pd.DataFrame and compare them with nunique()\n",
    "# NOTE(review): 公司数据选择器链结 is not defined in the visible part of this\n",
    "# notebook; presumably a {label: url} dict from last week's notebook - confirm.\n",
    "import pandas as pd\n",
    "df = pd.DataFrame([ urlparse(x) for x in 公司数据选择器链结.values()])\n",
    "print(df.nunique())\n",
    "\n",
    "# Last week B-3: parse the query component further (first value of each key)\n",
    "df_qs = pd.DataFrame([{k:v[0] for k,v in parse_qs(x).items()} for x in df['query'] ])\n",
    "# Report the query parameters; the original printed df.nunique() a second time.\n",
    "print(df_qs.nunique())\n",
    "\n",
    "# Last week B-4: build 参数模板 and 字典_compTag\n",
    "def parse_url_qs_for_compTag (url):\n",
    "    \"\"\"Return the query string of `url` parsed into a dict of value lists.\"\"\"\n",
    "    six_parts = urlparse(url)\n",
    "    out = parse_qs(six_parts.query)\n",
    "    return (out)\n",
    "\n",
    "# The first link serves as the template\n",
    "参数模板 = parse_url_qs_for_compTag(list(公司数据选择器链结.values())[0])\n",
    "print(参数模板)\n",
    "\n",
    "# label -> compTag code\n",
    "字典_compTag = { k:parse_url_qs_for_compTag(v)['compTag'][0] for k,v in 公司数据选择器链结.items()}\n",
    "print (字典_compTag)\n",
    "\n",
    "# B-5: generate request parameters from the template\n",
    "def 参数模板生成(compTag=None, keyword=None, curPage=None):\n",
    "    \"\"\"Return a copy of the global 参数模板 with the given fields overridden.\n",
    "\n",
    "    Every argument is a query value in parse_qs form (a list such as ['155']).\n",
    "    An argument left as None keeps whatever the template holds for that key.\n",
    "    curPage is accepted because the pagination cells further down call this\n",
    "    function with curPage=...; existing compTag/keyword calls are unaffected.\n",
    "    \"\"\"\n",
    "    参数 = 参数模板.copy()\n",
    "    覆盖 = {'compTag': compTag, 'keyword': keyword, 'curPage': curPage}\n",
    "    参数.update({k: v for k, v in 覆盖.items() if v is not None})\n",
    "    return (参数)\n",
    "\n",
    "参数_compTag_用户体验 = { k:参数模板生成(compTag = [v], keyword = ['用户体验']) for k,v in 字典_compTag.items()}\n",
    "print(参数_compTag_用户体验)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [],
   "source": [
    "from requests_html import HTMLSession\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "import pprint\n",
    "import time,datetime\n",
    "import pandas as pd\n",
    "session =HTMLSession()\n",
    "payload={\n",
    "    'type':2,\n",
    "    'query':'python'\n",
    "}\n",
    "url=\"https://weixin.sogou.com/weixin\"\n",
    "r = session.get(url,params=payload)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# A-2 Build the parameter template: find the key parameters and their structure\n",
    "\n",
    "# Required modules\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "import pandas as pd\n",
    "from IPython.display import display, HTML\n",
    "\n",
    "# Goal: starting from href_列表, work out the query-parameter dictionary\n",
    "\n",
    "# An empty href_列表 produces a DataFrame without a 'query' column and an\n",
    "# opaque KeyError below, so stop early with a clear message instead.\n",
    "if not href_列表:\n",
    "    raise ValueError('href_列表 is empty: no pagination links were found in the response')\n",
    "\n",
    "# Put the urlparse() results into a DataFrame\n",
    "df = pd.DataFrame([ urlparse(x) for x in href_列表])\n",
    "# Parse every query string, keeping the first value of each parameter\n",
    "df_qs = pd.DataFrame([{k:v[0] for k,v in parse_qs(x).items()} for x in df['query'] ])\n",
    "\n",
    "display(df)\n",
    "print(df.nunique())\n",
    "display(df_qs)\n",
    "print(df_qs.nunique())\n",
    "\n",
    "df_qs = df_qs.assign (curPage_int=df_qs.curPage.astype(int)) # cast curPage to int"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def parse_url_qs_for_curPage (url):\n",
    "    \"\"\"Return the query string of `url` parsed into a dict of value lists.\"\"\"\n",
    "    return parse_qs(urlparse(url).query)\n",
    "\n",
    "# Take the first pagination link as the template\n",
    "参数模板 = parse_url_qs_for_curPage(href_列表[0])\n",
    "print (参数模板)\n",
    "\n",
    "print (href_字典)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Last week C-1 / B-5: search parameters for every hot-company type\n",
    "# compTag code of each hot-company filter (labels kept exactly as scraped,\n",
    "# including the trailing space in one of them)\n",
    "_compTag_热门公司 = {\n",
    "    '中国500强': '155',\n",
    "    '2018互联网300强': '182',\n",
    "    '制造业500强': '186',\n",
    "    'AI创新成长50强 ': '189',\n",
    "    '独角兽': '130',\n",
    "    '上市公司': '156',\n",
    "}\n",
    "\n",
    "def _参数_用户体验(compTag):\n",
    "    \"\"\"Return the search parameters (parse_qs form) for one compTag code.\n",
    "\n",
    "    Only compTag differs between the hot-company types; every other value\n",
    "    is the same in all entries.\n",
    "    \"\"\"\n",
    "    return {\n",
    "        'init': ['-1'],\n",
    "        'headckid': ['58d828c357a8cb19'],\n",
    "        'flushckid': ['1'],\n",
    "        'fromSearchBtn': ['2'],\n",
    "        'keyword': ['用户体验'],\n",
    "        'compTag': [compTag],\n",
    "        'ckid': ['58d828c357a8cb19'],\n",
    "        'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
    "        'd_sfrom': ['search_unknown'],\n",
    "        'd_ckId': ['6aa779111c1b4ca77cff3648d9dee049'],\n",
    "        'd_curPage': ['0'],\n",
    "        'd_pageSize': ['40'],\n",
    "        'd_headId': ['6aa779111c1b4ca77cff3648d9dee049'],\n",
    "    }\n",
    "\n",
    "参数_compTag_用户体验 = {k: _参数_用户体验(v) for k, v in _compTag_热门公司.items()}\n",
    "参数_compTag_行业_用户体验 = { }\n",
    "\n",
    "# Last week C-1: single-page trial run with 中国500强\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "session = HTMLSession()\n",
    "payload = 参数_compTag_用户体验['中国500强']\n",
    "r = session.get( url, params = payload)\n",
    "\n",
    "# r.url\n",
    "\n",
    "# Last week C-2: simplified A-1 - fetch and parse a single page\n",
    "def requests_liepin( url, params):\n",
    "    \"\"\"Fetch one liepin result page and return its job list as a DataFrame.\n",
    "\n",
    "    url    -- address requested through the module-level `session`\n",
    "    params -- query parameters sent with this request\n",
    "    Returns a DataFrame with one row per <li> under ul.sojob-list and one\n",
    "    column per key of dict_xpaths.\n",
    "    \"\"\"\n",
    "    # Send the caller's params; the original passed the global `payload`,\n",
    "    # so the argument was silently ignored.\n",
    "    r = session.get( url , params = params)\n",
    "\n",
    "    # Select the job items first, then query inside each item\n",
    "    主要元素 = r.html.xpath( '//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # XPath table: key = output column, value = XPath, grouped by how the\n",
    "    # value is extracted (text / text_content / href)\n",
    "    dict_xpaths={ \n",
    "        'text': {\n",
    "            'edu':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水':    '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]', \n",
    "            '时间':    '//div[contains(@class,\"job-info\")]/p/time/@title', \n",
    "            '职称':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司地点': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链结':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        }\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        # text_content() of the first match inside every item\n",
    "        return [e.xpath(_xpath_)[0].lxml.text_content() for e in 主要元素]\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        # Matches are either plain strings (attribute values) or elements;\n",
    "        # strip each piece and join the pieces per item\n",
    "        return [\"\".join([x.strip() if type(x) is str else x.text.strip() for x in e.xpath(_xpath_)]) for e in 主要元素]\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        # An absolute link of the first match per item, \"\" when there is none.\n",
    "        # The XPath is evaluated once per item, and an item without a match\n",
    "        # yields \"\" instead of failing on None.\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            节点 = e.xpath(_xpath_, first=True)\n",
    "            链结 = list(节点.absolute_links) if 节点 is not None else []\n",
    "            暂存结果.append(链结[0] if 链结 else \"\")\n",
    "        return 暂存结果\n",
    "\n",
    "    # Extract every column relative to the job items only\n",
    "    数据字典 = {k:get_e_text_content(v) for k,v in dict_xpaths['text_content'].items()}\n",
    "    数据字典.update({k:get_e_text(v) for k,v in dict_xpaths['text'].items()})\n",
    "    数据字典.update({k:get_e_href(v) for k,v in dict_xpaths['href'].items()})\n",
    "\n",
    "    数据 = pd.DataFrame(数据字典)\n",
    "    #数据.to_excel(\"20春_Web数据挖掘_week03_liepin.xlsx\", sheet_name=\"搜查结果\")\n",
    "    return (数据)\n",
    "\n",
    "\n",
    "# Last week C-3: several pages, one per hot-company type\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "\n",
    "list_df = list()\n",
    "for k,v in 参数_compTag_用户体验.items():\n",
    "    payload = v\n",
    "    df = requests_liepin( url, params = payload)\n",
    "    df = df.assign (热门公司类型 = k)    \n",
    "    list_df.append(df)\n",
    "\n",
    "df_all = pd.concat(list_df)\n",
    "\n",
    "# Last week C-4: export\n",
    "df_all.to_excel(\"20春_Web数据挖掘_week03_liepin_各热门公司类型.xlsx\", sheet_name=\"搜查结果\")\n",
    "\n",
    "# Last week C-5: basic pandas\n",
    "\n",
    "print (df_all.nunique())\n",
    "# A bare expression in the middle of a cell shows nothing, so display it explicitly\n",
    "display(df_all[['edu']].drop_duplicates())\n",
    "\n",
    "df_all.groupby(['公司名称','edu']).agg({\"职称\":\"count\"}).sort_values(by='职称', ascending=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# B-1 (last week's C-2): simplified version of the earlier A-1 - fetch and parse a single page\n",
    "session = HTMLSession()\n",
    "\n",
    "def requests_liepin( url, params):\n",
    "    \"\"\"Fetch one liepin result page and return its job list as a DataFrame.\n",
    "\n",
    "    url    -- address requested through the module-level `session`\n",
    "    params -- query parameters sent with this request\n",
    "    Returns a DataFrame with one row per <li> under ul.sojob-list and one\n",
    "    column per key of dict_xpaths.\n",
    "    \"\"\"\n",
    "    # Send the caller's params; the original passed the global `payload`,\n",
    "    # so the argument was silently ignored.\n",
    "    r = session.get( url , params = params)\n",
    "\n",
    "    # Select the job items first, then query inside each item\n",
    "    主要元素 = r.html.xpath( '//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # XPath table: key = output column, value = XPath, grouped by how the\n",
    "    # value is extracted (text / text_content / href)\n",
    "    dict_xpaths={ \n",
    "        'text': {\n",
    "            'edu':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水':    '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]', \n",
    "            '时间':    '//div[contains(@class,\"job-info\")]/p/time/@title', \n",
    "            '职称':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司地点': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链结':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        }\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        # text_content() of the first match inside every item\n",
    "        return [e.xpath(_xpath_)[0].lxml.text_content() for e in 主要元素]\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        # Matches are either plain strings (attribute values) or elements;\n",
    "        # strip each piece and join the pieces per item\n",
    "        return [\"\".join([x.strip() if type(x) is str else x.text.strip() for x in e.xpath(_xpath_)]) for e in 主要元素]\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        # An absolute link of the first match per item, \"\" when there is none.\n",
    "        # The XPath is evaluated once per item, and an item without a match\n",
    "        # yields \"\" instead of failing on None.\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            节点 = e.xpath(_xpath_, first=True)\n",
    "            链结 = list(节点.absolute_links) if 节点 is not None else []\n",
    "            暂存结果.append(链结[0] if 链结 else \"\")\n",
    "        return 暂存结果\n",
    "\n",
    "    # Extract every column relative to the job items only\n",
    "    数据字典 = {k:get_e_text_content(v) for k,v in dict_xpaths['text_content'].items()}\n",
    "    数据字典.update({k:get_e_text(v) for k,v in dict_xpaths['text'].items()})\n",
    "    数据字典.update({k:get_e_href(v) for k,v in dict_xpaths['href'].items()})\n",
    "\n",
    "    数据 = pd.DataFrame(数据字典)\n",
    "    #数据.to_excel(\"20春_Web数据挖掘_week03_liepin.xlsx\", sheet_name=\"搜查结果\")\n",
    "    return (数据)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 爬亦有道- 不要爬太快\n",
    "time.sleep"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%time\n",
    "# Import here so the cell also runs on a fresh kernel: `random` is otherwise\n",
    "# only imported by cells further down.\n",
    "import time\n",
    "from random import random\n",
    "\n",
    "# Pause for a random 3-7 seconds\n",
    "time.sleep(3+4*random())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%time\n",
    "# B-2 Several pages, but slowed down with time.sleep\n",
    "# (%%time is a cell magic: it has to be the very first line of the cell)\n",
    "\n",
    "import time\n",
    "from random import random\n",
    "\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "\n",
    "list_df = list()\n",
    "# NOTE(review): 参数_keyword_用户体验_curPage is not defined in the visible part\n",
    "# of this notebook; presumably a {page number: request parameters} dict - confirm.\n",
    "for k,v in 参数_keyword_用户体验_curPage.items():\n",
    "    payload = v\n",
    "    df = requests_liepin( url, params = payload)\n",
    "    time.sleep(3+4*random())  # slow down: 3-7 seconds, about 5 on average\n",
    "    df = df.assign (curPage = k)  # tag the rows with their page\n",
    "    list_df.append(df)\n",
    "\n",
    "df_all = pd.concat(list_df).reset_index()\n",
    "df_all.index.name = '序'\n",
    "\n",
    "# Last week C-4: export\n",
    "df_all.to_excel(\"20春_Web数据挖掘_week04_liepin_翻页.xlsx\", sheet_name=\"用户体验\")\n",
    "\n",
    "# Estimated time: 5s*10 =50\n",
    "# Estimated rows: 40*10 =400"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%time\n",
    "# B-3 Several pages x several keywords\n",
    "import time\n",
    "from random import random\n",
    "\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "\n",
    "keywords = ['用户体验','UX']\n",
    "list_df = list()\n",
    "\n",
    "for key in keywords:\n",
    "    ## Probe the first page to learn how many pages this keyword has.\n",
    "    # Fetch it into `r` here: requests_liepin() returns only a DataFrame, so\n",
    "    # the original read the pagination links from whatever older response\n",
    "    # `r` still held.\n",
    "    payload = 参数模板生成(keyword=[key], curPage=['0'])\n",
    "    r = session.get( url, params = payload)\n",
    "    time.sleep(3+4*random())  # slow down after the probe as well\n",
    "    href_列表 = [x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "    # First curPage value of every pagination link, as integers\n",
    "    页码 = [int(v) for x in href_列表 for v in parse_qs(urlparse(x).query).get('curPage', [])[:1]]\n",
    "    长度 = max(页码, default=0) + 1  # no pagination links -> a single page\n",
    "    参数_keyword_X_curPage = { \n",
    "        i:参数模板生成(curPage = [i], keyword = [key])\n",
    "        for i in range(0,长度)\n",
    "        }\n",
    "    #print (参数_keyword_X_curPage)\n",
    "    print (key,长度)\n",
    "    \n",
    "    for k,v in 参数_keyword_X_curPage.items():\n",
    "        payload = v\n",
    "        df = requests_liepin( url, params = payload)\n",
    "        time.sleep(3+4*random())  # slow down: 3-7 seconds, about 5 on average\n",
    "        df = df.assign (keyword = key)  # tag the rows with their keyword\n",
    "        df = df.assign (curPage = k)  # tag the rows with their page\n",
    "        list_df.append(df)\n",
    "        \n",
    "df_all = pd.concat(list_df).reset_index()\n",
    "df_all.index.name = '序'\n",
    "\n",
    "df_all.to_excel(\"20春_Web数据挖掘_week04_liepin_翻页.xlsx\", sheet_name=\"_\".join(keywords))\n",
    "# Estimated time: 2*5s*10 =100\n",
    "# Estimated rows: 2*40*10 =800"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 翻页：数据备份与整合\n",
    "多个页面+多个关键词执行时，若怕中断最好把每一页的df内容备份做中继"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%time\n",
    "# C-1 Several pages x several keywords, with a backup file per page\n",
    "import time\n",
    "from random import random\n",
    "\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "\n",
    "keywords = ['用户体验','UX','产品需求','PRD']\n",
    "list_df = list()\n",
    "\n",
    "for key in keywords:\n",
    "    ## Probe the first page to learn how many pages this keyword has.\n",
    "    # Fetch it into `r` here: requests_liepin() returns only a DataFrame, so\n",
    "    # the original read the pagination links from whatever older response\n",
    "    # `r` still held.\n",
    "    payload = 参数模板生成(keyword=[key], curPage=['0'])\n",
    "    r = session.get( url, params = payload)\n",
    "    time.sleep(3+4*random())  # slow down after the probe as well\n",
    "    href_列表 = [x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "    # First curPage value of every pagination link, as integers\n",
    "    页码 = [int(v) for x in href_列表 for v in parse_qs(urlparse(x).query).get('curPage', [])[:1]]\n",
    "    长度 = max(页码, default=0) + 1  # no pagination links -> a single page\n",
    "    参数_keyword_X_curPage = { \n",
    "        i:参数模板生成(curPage = [i], keyword = [key])\n",
    "        for i in range(0,长度)\n",
    "        }\n",
    "    #print (参数_keyword_X_curPage)\n",
    "    print (key,长度)\n",
    "    \n",
    "    for k,v in 参数_keyword_X_curPage.items():\n",
    "        payload = v\n",
    "        df = requests_liepin( url, params = payload)\n",
    "        time.sleep(3+4*random())  # slow down: 3-7 seconds, about 5 on average\n",
    "        ## Backup: write every page to its own file so an interrupted run loses nothing\n",
    "        df.to_csv(\"20春_Web数据挖掘_week04_liepin_{key}_{k}.tsv\".format(key=key, k=k), sep=\"\\t\", encoding=\"utf8\")\n",
    "        \n",
    "        df = df.assign (keyword = key)  # tag the rows with their keyword\n",
    "        df = df.assign (curPage = k)  # tag the rows with their page\n",
    "        list_df.append(df)\n",
    "        \n",
    "df_all = pd.concat(list_df).reset_index()\n",
    "df_all.index.name = '序'\n",
    "\n",
    "df_all.to_excel(\"20春_Web数据挖掘_week04_liepin_翻页_4.xlsx\", sheet_name=\"_\".join(keywords))\n",
    "# Estimated time: 4*5s*10 =200\n",
    "# Estimated rows: 4*40*10 =1600"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 练习"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 构建行业字典"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 方法一"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'互联网/电商': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=040&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '游戏产业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=420&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '计算机软件': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=010&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " 'IT服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=030&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '电子/芯片/半导体': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=050&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '通信业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=060&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '计算机/网络设备': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=020&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '房地产/建筑': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=080&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '规划/设计/装潢': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=100&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '房地产服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=090&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '银行': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=130&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '保险': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=140&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '基金/证券/投资': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=150&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '会计/审计': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=430&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '信托/担保/拍卖': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=500&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '快消品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=190&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '批发零售': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=240&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '服装纺织': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=200&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '家具/家电': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=210&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '办公设备': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=220&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '奢侈品/收藏品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=460&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '珠宝/玩具/工艺品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=470&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '汽车/摩托车': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=350&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '机械/机电/重工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=360&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '印刷/包装/造纸': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=180&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '原材料加工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=370&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '仪器/电气/自动化': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=340&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '制药/生物工程': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=270&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '医疗/保健/美容': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=280&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '医疗器械': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=290&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '能源/水利': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=330&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '石油/化工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=310&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '采掘/冶炼/矿产': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=320&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '环保': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=300&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '新能源': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=490&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '专业服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=120&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '中介服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=110&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '外包服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=440&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '检测/认证': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=450&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '餐饮/酒旅/服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=230&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '文体娱乐': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=260&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '租赁服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=510&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '广告/市场/会展': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=070&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '影视文化': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=170&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '教育培训': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=380&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '交通/物流/运输': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=250&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '贸易/进出口': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=160&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '航空/航天': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=480&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '政务/公共服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=390&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '农林牧渔': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=410&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '其他行业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=400&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473'}"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from requests_html import HTMLSession\n",
    "session =HTMLSession()\n",
    "url=\"https://www.liepin.com/zhaopin/\"\n",
    "r=session.get(url)\n",
    "行业细分=r.html.xpath(\"//div[@class='sub-industry']/a\")\n",
    "#行业细分\n",
    "行业字典={a.xpath(\"a/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 行业细分}\n",
    "行业字典\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 方法二"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'互联网/电商': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=040&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '游戏产业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=420&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '计算机软件': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=010&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " 'IT服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=030&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '电子/芯片/半导体': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=050&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '通信业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=060&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '计算机/网络设备': '/zhaopin/?subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=020&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '房地产/建筑': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=080&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '规划/设计/装潢': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=100&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '房地产服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=090&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '银行': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=130&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '保险': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=140&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '基金/证券/投资': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=150&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '会计/审计': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=430&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '信托/担保/拍卖': '/zhaopin/?subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=500&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '快消品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=190&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '批发零售': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=240&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '服装纺织': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=200&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '家具/家电': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=210&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '办公设备': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=220&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '奢侈品/收藏品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=460&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '珠宝/玩具/工艺品': '/zhaopin/?subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=470&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '汽车/摩托车': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=350&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '机械/机电/重工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=360&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '印刷/包装/造纸': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=180&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '原材料加工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=370&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '仪器/电气/自动化': '/zhaopin/?subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=340&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '制药/生物工程': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=270&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '医疗/保健/美容': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=280&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '医疗器械': '/zhaopin/?subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=290&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '能源/水利': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=330&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '石油/化工': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=310&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '采掘/冶炼/矿产': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=320&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '环保': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=300&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '新能源': '/zhaopin/?subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=490&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '专业服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=120&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '中介服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=110&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '外包服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=440&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '检测/认证': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=450&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '餐饮/酒旅/服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=230&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '文体娱乐': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=260&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '租赁服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=510&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '广告/市场/会展': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=070&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '影视文化': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=170&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '教育培训': '/zhaopin/?subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=380&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '交通/物流/运输': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=250&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '贸易/进出口': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=160&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '航空/航天': '/zhaopin/?subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=480&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '政务/公共服务': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=390&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '农林牧渔': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=410&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473',\n",
       " '其他行业': '/zhaopin/?subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=400&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473'}"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "行业细分2 = r.html.xpath('//div[@data-selector=\"search-conditions\"]')[0] \\\n",
    "                    .xpath('//dt[@class=\"search-title\"]/following-sibling::dd')[1] \\\n",
    "                    .xpath('//div[contains(@class,\"sub-industry\")]/a')\n",
    "行业细分2\n",
    "\n",
    "\n",
    "行业字典2={a.xpath(\"a/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 行业细分2}\n",
    "行业字典2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>游戏产业</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>计算机软件</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>IT服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>电子/芯片/半导体</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>通信业</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>计算机/网络设备</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>房地产/建筑</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>规划/设计/装潢</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>房地产服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>银行</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>保险</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>会计/审计</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>信托/担保/拍卖</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>快消品</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>批发零售</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>服装纺织</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>家具/家电</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>办公设备</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>奢侈品/收藏品</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>珠宝/玩具/工艺品</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>汽车/摩托车</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>机械/机电/重工</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>印刷/包装/造纸</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>原材料加工</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>仪器/电气/自动化</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>制药/生物工程</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>医疗/保健/美容</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>医疗器械</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>能源/水利</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>石油/化工</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>采掘/冶炼/矿产</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>环保</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>新能源</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>专业服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>中介服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>外包服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>检测/认证</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>餐饮/酒旅/服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>文体娱乐</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>租赁服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>广告/市场/会展</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>影视文化</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>教育培训</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>交通/物流/运输</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>贸易/进出口</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>航空/航天</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>政务/公共服务</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>农林牧渔</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>其他行业</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   scheme netloc       path params query fragment\n",
       "0                    互联网/电商                      \n",
       "1                      游戏产业                      \n",
       "2                     计算机软件                      \n",
       "3                      IT服务                      \n",
       "4                 电子/芯片/半导体                      \n",
       "5                       通信业                      \n",
       "6                  计算机/网络设备                      \n",
       "7                    房地产/建筑                      \n",
       "8                  规划/设计/装潢                      \n",
       "9                     房地产服务                      \n",
       "10                       银行                      \n",
       "11                       保险                      \n",
       "12                 基金/证券/投资                      \n",
       "13                    会计/审计                      \n",
       "14                 信托/担保/拍卖                      \n",
       "15                      快消品                      \n",
       "16                     批发零售                      \n",
       "17                     服装纺织                      \n",
       "18                    家具/家电                      \n",
       "19                     办公设备                      \n",
       "20                  奢侈品/收藏品                      \n",
       "21                珠宝/玩具/工艺品                      \n",
       "22                   汽车/摩托车                      \n",
       "23                 机械/机电/重工                      \n",
       "24                 印刷/包装/造纸                      \n",
       "25                    原材料加工                      \n",
       "26                仪器/电气/自动化                      \n",
       "27                  制药/生物工程                      \n",
       "28                 医疗/保健/美容                      \n",
       "29                     医疗器械                      \n",
       "30                    能源/水利                      \n",
       "31                    石油/化工                      \n",
       "32                 采掘/冶炼/矿产                      \n",
       "33                       环保                      \n",
       "34                      新能源                      \n",
       "35                     专业服务                      \n",
       "36                     中介服务                      \n",
       "37                     外包服务                      \n",
       "38                    检测/认证                      \n",
       "39                 餐饮/酒旅/服务                      \n",
       "40                     文体娱乐                      \n",
       "41                     租赁服务                      \n",
       "42                 广告/市场/会展                      \n",
       "43                     影视文化                      \n",
       "44                     教育培训                      \n",
       "45                 交通/物流/运输                      \n",
       "46                   贸易/进出口                      \n",
       "47                    航空/航天                      \n",
       "48                  政务/公共服务                      \n",
       "49                     农林牧渔                      \n",
       "50                     其他行业                      "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "scheme       1\n",
      "netloc       1\n",
      "path        51\n",
      "params       1\n",
      "query        1\n",
      "fragment     1\n",
      "dtype: int64\n"
     ]
    }
   ],
   "source": [
    "from urllib.parse import urlparse, parse_qs\n",
    "import pandas as pd\n",
    "from IPython.display import display, HTML\n",
    "\n",
    "# 总体目标：输入 href_列表, 建构出参数字典\n",
    "\n",
    "# urlparse 解析后丢入数据框\n",
    "df = pd.DataFrame([ urlparse(x) for x in 行业字典])\n",
    "df_qs = pd.DataFrame([{k:v[0] for k,v in parse_qs(x).items()} for x in df['query'] ])\n",
    "\n",
    "display(df)\n",
    "print(df.nunique())\n",
    "# display(df_qs)\n",
    "# print(df_qs.nunique())\n",
    "\n",
    "# df_qs.curPage\n",
    "# df_qs = df_qs.assign (curPage_int=df_qs.curPage.astype(int)) # 变成整数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=040&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=420&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=010&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_01&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=030&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=050&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=060&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_02&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=020&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=080&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=100&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_03&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=090&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=130&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=140&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=150&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=430&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_04&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=500&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=190&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=240&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=200&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=210&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=220&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=460&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_05&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=470&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=350&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=360&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=180&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=370&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_06&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=340&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=270&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=280&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_10&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=290&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=330&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=310&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=320&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=300&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_11&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=490&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=120&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=110&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=440&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=450&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=230&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=260&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_07&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=510&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=070&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=170&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_08&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=380&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=250&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=160&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_09&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=480&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=390&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=410&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment=''),\n",
       " ParseResult(scheme='', netloc='', path='/zhaopin/', params='', query='subIndustry=&init=-1&industryType=industry_12&headckid=156b682b67f66e9e&flushckid=1&fromSearchBtn=2&industries=400&ckid=3b69fd701f0c302c&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=e81d0deb459eb2e0788dec6539fd3473&d_curPage=0&d_pageSize=40&d_headId=e81d0deb459eb2e0788dec6539fd3473', fragment='')]"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from urllib.parse import urlparse, parse_qs\n",
    "[ urlparse(x) for x in 行业字典.values()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 51 entries, 0 to 50\n",
      "Data columns (total 6 columns):\n",
      " #   Column    Non-Null Count  Dtype \n",
      "---  ------    --------------  ----- \n",
      " 0   scheme    51 non-null     object\n",
      " 1   netloc    51 non-null     object\n",
      " 2   path      51 non-null     object\n",
      " 3   params    51 non-null     object\n",
      " 4   query     51 non-null     object\n",
      " 5   fragment  51 non-null     object\n",
      "dtypes: object(6)\n",
      "memory usage: 2.5+ KB\n",
      "scheme       1\n",
      "netloc       1\n",
      "path        51\n",
      "params       1\n",
      "query        1\n",
      "fragment     1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  scheme netloc    path params query fragment\n",
       "0                互联网/电商                      "
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pandas as pd\n",
    "df = pd.DataFrame([ urlparse(x)for x in 行业字典])\n",
    "df.info()\n",
    "print(df.nunique())\n",
    "df.head(1)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 构建行业参数模板"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from requests_html import HTMLSession\n",
    "session =HTMLSession()\n",
    "url=\"https://www.liepin.com/zhaopin/\"\n",
    "r=session.get(url)\n",
    "行业细分=r.html.xpath(\"//div[@class='sub-industry']/a\")\n",
    "#行业细分\n",
    "行业字典={a.xpath(\"a/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 行业细分}\n",
    "行业字典"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 构建地区字典"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 方法一"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'全国': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '北京': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=010&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '上海': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=020&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '广州': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=050020&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '深圳': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=050090&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '天津': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=030&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '苏州': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=060080&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '重庆': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=040&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '南京': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=060020&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '杭州': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=070020&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '大连': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=210040&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '成都': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=280020&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '武汉': '/zhaopin/?init=-1&ckid=79d26aeb692d8afd&headckid=79d26aeb692d8afd&flushckid=1&fromSearchBtn=2&dqs=170020&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=9dea5cfe13037393337e11ea01efad60&d_curPage=0&d_pageSize=40&d_headId=9dea5cfe13037393337e11ea01efad60',\n",
       " '其他': 'javascript:;'}"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from requests_html import HTMLSession\n",
    "session =HTMLSession()\n",
    "url=\"https://www.liepin.com/zhaopin/\"\n",
    "r=session.get(url)\n",
    "地区细分=r.html.xpath(\"//div[@class='search-conditions']/dl[3]/dd/a\")\n",
    "#行业细分\n",
    "地区字典={a.xpath(\"a/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 地区细分}\n",
    "地区字典"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 方法二"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "地区细分2 = r.html.xpath('//div[@data-selector=\"search-conditions\"]')[0] \\\n",
    "                  .xpath('//dt[@class=\"search-title\"]/following-sibling::dd')[2] \\\n",
    "                  .xpath('//div[contains(@class,\"active\")]/a/@href')\n",
    "\n",
    "\n",
    "# 地区字典2={a.xpath(\"a/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 地区细分2}\n",
    "# 地区字典2\n",
    "\n",
    "# 地区细分=r.html.xpath(\"//div[@class='search-conditions']/dl[3]/dd/a\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 构建公司字典"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'道通科技': 'https://www.liepin.com/company/8116218/',\n",
       " '五矿证券': 'https://www.liepin.com/company/1050201/',\n",
       " '奥飞': 'https://www.liepin.com/company/7875551/',\n",
       " '贵州天马传媒有限公司': 'https://www.liepin.com/company/5028062/',\n",
       " '上海南芯半导体科技有限公司': 'https://www.liepin.com/company/8903012/',\n",
       " '旭阳置业有限公司': 'https://www.liepin.com/company/9402612/',\n",
       " '广东奥园商业地产集团有限公司': 'https://www.liepin.com/company/8608772/',\n",
       " '你我贷': 'https://www.liepin.com/company/8639190/',\n",
       " '安踏体育': 'https://www.liepin.com/company/7991541/',\n",
       " '沈阳万科企业有限公司': 'https://www.liepin.com/company/9912521/',\n",
       " '好未来': 'https://www.liepin.com/company/922091/',\n",
       " '上海燕谷坊电子商务有限公司': 'https://www.liepin.com/company/9709096/',\n",
       " '亮风台(上海)信息科技有限公司': 'https://www.liepin.com/company/8982963/',\n",
       " '中天建设集团有限公司': 'https://www.liepin.com/company/9165202/',\n",
       " '雅居乐': 'https://www.liepin.com/company/185424/',\n",
       " '张家口大好河山新农业开发有限公司': 'https://www.liepin.com/company/9608547/',\n",
       " '宁波方力集团有限公司': 'https://www.liepin.com/company/7937350/',\n",
       " '乐元素': 'https://www.liepin.com/company/951672/',\n",
       " '国药租赁': 'https://www.liepin.com/company/8351723/',\n",
       " '广州麦匠信息科技有限公司': 'https://www.liepin.com/company/9356817/',\n",
       " '大泰金石基金销售有限公司': 'https://www.liepin.com/company/10249347/',\n",
       " '顺络电子': 'https://www.liepin.com/company/9558662/',\n",
       " '岭南教育': 'https://www.liepin.com/company/8234719/',\n",
       " '纳晶科技股份有限公司': 'https://www.liepin.com/company/7874262/',\n",
       " '恒瑞医药-福建盛迪医药有限公司': 'https://www.liepin.com/company/10100161/',\n",
       " '海伦堡地产集团': 'https://www.liepin.com/company/7021816/',\n",
       " '宁波唐狮网络科技有限公司': 'https://www.liepin.com/company/9327830/',\n",
       " '华润集团信息管理部': 'https://www.liepin.com/company/9249205/',\n",
       " '浙江亚光科技股份有限公司': 'https://www.liepin.com/company/8070606/',\n",
       " '武汉车千线汽车科技有限公司': 'https://www.liepin.com/company/9529920/',\n",
       " '安克创新': 'https://www.liepin.com/company/8733738/',\n",
       " '上海蓝云实业发展有限公司': 'https://www.liepin.com/company/10050545/',\n",
       " '武汉中城悦城房地产开发有限公司': 'https://www.liepin.com/company/9733701/',\n",
       " '上海和荣建筑工程集团有限公司': 'https://www.liepin.com/company/9533420/',\n",
       " '艺朝艺夕教育科技集团有限公司': 'https://www.liepin.com/company/9637807/',\n",
       " '上海延安医药有限公司': 'https://www.liepin.com/company/9270016/',\n",
       " '湖北威马楚通实业集团有限公司': 'https://www.liepin.com/company/8966480/',\n",
       " '深圳市明源软件股份有限公司': 'https://www.liepin.com/company/1682247/',\n",
       " '佛山绿康置业有限公司': 'https://www.liepin.com/company/10015527/'}"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from requests_html import HTMLSession\n",
    "session =HTMLSession()\n",
    "url=\"https://www.liepin.com/zhaopin/\"\n",
    "r=session.get(url)\n",
    "公司细分=r.html.xpath(\"//div[contains(@class,'sojob-item-main')]//p[@class='company-name']/a\")\n",
    "#行业细分\n",
    "公司字典={a.xpath(\"a/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 公司细分}\n",
    "公司字典"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{}"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from requests_html import HTMLSession\n",
    "session =HTMLSession()\n",
    "url=\"https://www.liepin.com/zhaopin/\"\n",
    "r=session.get(url)\n",
    "公司细分=r.html.xpath(\"//div[@class='search-conditions']/dl[2]/dd/a\")\n",
    "#行业细分\n",
    "公司字典={a.xpath(\"a/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 公司细分}\n",
    "公司字典"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 互评数据，不互评代码（参考代码：week03-week04）\n",
    "  1.  观察三变量+一关键词的url。\n",
    "  2.  解析url参数。\n",
    "  3.  创建payload模板。\n",
    "  4.  xpath解析页面数据。\n",
    "  5.  翻页（可参考之前的翻页参数模板）。"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 猎聘网站抓取职位的基本信息函数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "def requests_liepin( url, params):\n",
    "    r = session.get( url , params = payload)\n",
    "\n",
    "    # 先取特定元素, 精准打击其子后辈\n",
    "    主要元素 = r.html.xpath( '//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # 作为xpath字典，键为我要抓的牛肉名称，值为xpath\n",
    "    dict_xpaths={ \n",
    "        'text': {\n",
    "            'edu':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水':    '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]', \n",
    "            '时间':    '//div[contains(@class,\"job-info\")]/p/time/@title', \n",
    "            '职称':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司地点': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链结':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        }\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        # 高级列表推导\n",
    "        暂存结果 = [e.xpath(_xpath_)[0].lxml.text_content() for e in 主要元素]\n",
    "        return(暂存结果)\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        # 高级列表推导\n",
    "        暂存结果 = [\"\".join([x.strip() if type(x) is str else x.text.strip() for x in e.xpath(_xpath_)]) for e in 主要元素]\n",
    "        return(暂存结果)\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        # 高级列表推导\n",
    "        暂存结果 = [list(e.xpath(_xpath_, first=True).absolute_links)[0] \\\n",
    "                   if len(e.xpath(_xpath_, first=True).absolute_links) >= 1  \\\n",
    "                   else \"\" for e in 主要元素]\n",
    "        return(暂存结果)\n",
    "\n",
    "    # 只对主要元素下进行.xpath取值\n",
    "    数据字典 = dict()\n",
    "\n",
    "    数据字典 = {k:get_e_text_content(v) for k,v in dict_xpaths['text_content'].items()}\n",
    "    数据字典.update({k:get_e_text(v) for k,v in dict_xpaths['text'].items()})\n",
    "    数据字典.update({k:get_e_href(v) for k,v in dict_xpaths['href'].items()})\n",
    "\n",
    "    数据 = pd.DataFrame(数据字典)\n",
    "    #数据.to_excel(\"20春_Web数据挖掘_week03_liepin.xlsx\", sheet_name=\"搜查结果\")\n",
    "    return (数据)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 准备好翻页数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{0: {'compIds': ['7983148'],\n",
       "  'key': ['数据挖掘'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['aa4a3ef545437f22'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['a59191c7e9b1b0c8°radeFlag=0'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'curPage': [0]},\n",
       " 1: {'compIds': ['7983148'],\n",
       "  'key': ['数据挖掘'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['aa4a3ef545437f22'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['a59191c7e9b1b0c8°radeFlag=0'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'curPage': [1]}}"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "url=\"https://www.liepin.com/zhaopin/?isAnalysis=&dqs=&pubTime=&salary=&compIds=7983148&subIndustry=&industryType=&compscale=&key=%E6%95%B0%E6%8D%AE%E5%88%86%E6%9E%90%E5%B8%88&init=-1&searchType=1&headckid=aa4a3ef545437f22&flushckid=1&compkind=&fromSearchBtn=2&sortFlag=15&ckid=aa4a3ef545437f22&jobKind=&industries=&clean_condition=&siTag=bFGQTbwE_AAQSb-u11jrBw%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_prime&d_ckId=591ebc1760fee953b72353bace17e6cc&d_curPage=0&d_pageSize=40&d_headId=591ebc1760fee953b72353bace17e6cc\"\n",
    "r=session.get(url)\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "翻页url={x.text:x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)}\n",
    "翻页url\n",
    "href_翻页=[x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "df=pd.DataFrame([urlparse(x) for x in href_翻页 ])\n",
    "df_qs=pd.DataFrame([{ k:v[0] for k,v in parse_qs(x).items()}for x in df['query']])\n",
    "df_qs = df_qs.assign (curPage_int=df_qs.curPage.astype(int)) \n",
    "df_qs\n",
    "长度=int(df_qs.curPage_int.max()+1)\n",
    "def 翻页_参数拆解(url):\n",
    "    sixpart=urlparse(url)\n",
    "    out=parse_qs(sixpart.query)\n",
    "    return out\n",
    "\n",
    "翻页_参数模板=翻页_参数拆解(href_翻页[0])\n",
    "翻页_参数模板\n",
    "def 翻页_参数调整(key,curPage,compIds):\n",
    "    参数=翻页_参数模板.copy()\n",
    "    参数['key']=key\n",
    "    参数['curPage']=curPage\n",
    "    参数['compIds']=compIds\n",
    "    return 参数\n",
    "指定公司_关键词_翻页参数={i:翻页_参数调整(key=['数据挖掘'],compIds=['7983148'],curPage = [i])\n",
    "                                   for i in  range(0,长度)\n",
    "                                  }\n",
    "\n",
    "指定公司_关键词_翻页参数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{0: {'compIds': ['7983148'],\n",
       "  'key': ['分析'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['aa4a3ef545437f22'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['50b957bdba487186°radeFlag=0'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'curPage': [0]},\n",
       " 1: {'compIds': ['7983148'],\n",
       "  'key': ['分析'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['aa4a3ef545437f22'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['50b957bdba487186°radeFlag=0'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['591ebc1760fee953b72353bace17e6cc'],\n",
       "  'curPage': [1]}}"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Fetch one liepin search-result page and derive the page count from its pager links.\n",
    "url=\"https://www.liepin.com/zhaopin/?isAnalysis=&dqs=&pubTime=&salary=&compIds=7983148&subIndustry=&industryType=&compscale=&key=%E6%95%B0%E6%8D%AE%E5%88%86%E6%9E%90%E5%B8%88&init=-1&searchType=1&headckid=aa4a3ef545437f22&flushckid=1&compkind=&fromSearchBtn=2&sortFlag=15&ckid=aa4a3ef545437f22&jobKind=&industries=&clean_condition=&siTag=bFGQTbwE_AAQSb-u11jrBw%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_prime&d_ckId=591ebc1760fee953b72353bace17e6cc&d_curPage=0&d_pageSize=40&d_headId=591ebc1760fee953b72353bace17e6cc\"\n",
    "r=session.get(url)\n",
    "\n",
    "# Pager anchors only: the starts-with predicate keeps hrefs that begin with '/zhaopin'.\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "\n",
    "# Anchor text -> href, plus the same hrefs as a plain list.\n",
    "翻页url = dict((a.text, a.xpath('//@href')[0]) for a in r.html.xpath(xpath_翻页a))\n",
    "href_翻页 = list(a.xpath('//@href')[0] for a in r.html.xpath(xpath_翻页a))\n",
    "\n",
    "# One row per href, one column per urlparse() component.\n",
    "df = pd.DataFrame(list(map(urlparse, href_翻页)))\n",
    "\n",
    "# One row per href with every query parameter reduced to its first value;\n",
    "# curPage_int is curPage cast to int so it can be compared numerically.\n",
    "df_qs = (\n",
    "    pd.DataFrame([\n",
    "        dict((名称, 取值[0]) for 名称, 取值 in parse_qs(查询).items())\n",
    "        for 查询 in df['query']\n",
    "    ])\n",
    "    .assign(curPage_int=lambda 表: 表['curPage'].astype(int))\n",
    ")\n",
    "\n",
    "# curPage is treated as zero-based here, so the page count is the largest value plus one.\n",
    "长度 = int(df_qs['curPage_int'].max() + 1)\n",
    "def 翻页_参数拆解(url):\n",
    "    \"\"\"Split a URL's query string into a ``{name: [values]}`` dict.\n",
    "\n",
    "    Args:\n",
    "        url: Absolute or relative URL, e.g. a pager href scraped from the page.\n",
    "\n",
    "    Returns:\n",
    "        dict mapping each parameter name to its list of values, as produced by\n",
    "        ``urllib.parse.parse_qs`` (parameters with blank values are omitted).\n",
    "    \"\"\"\n",
    "    # Scraped hrefs arrive with '°radeFlag=0' glued onto the ckid value: the '&deg'\n",
    "    # of '&degradeFlag' has been turned into the degree sign (presumably by HTML\n",
    "    # entity decoding). Restore the separator so degradeFlag is its own parameter.\n",
    "    修复后 = url.replace('°radeFlag', '&degradeFlag')\n",
    "    return parse_qs(urlparse(修复后).query)\n",
    "\n",
    "# Parameters of the first pager link; 翻页_参数调整 copies this dict for each page it builds.\n",
    "翻页_参数模板 = 翻页_参数拆解(url=href_翻页[0])\n",
    "def 翻页_参数调整(key,curPage,compIds,模板=None):\n",
    "    \"\"\"Build one request-parameter dict from a template with three fields overridden.\n",
    "\n",
    "    Args:\n",
    "        key: Value stored under 'key' (callers in this cell pass a one-element list).\n",
    "        curPage: Value stored under 'curPage'.\n",
    "        compIds: Value stored under 'compIds'.\n",
    "        模板: Template dict to start from. Defaults to the module-level\n",
    "            翻页_参数模板 when omitted, which is the original behaviour.\n",
    "\n",
    "    Returns:\n",
    "        A new dict. It shares no mutable value with the template, so editing the\n",
    "        result can never alter the template or another generated dict.\n",
    "    \"\"\"\n",
    "    import copy\n",
    "\n",
    "    if 模板 is None:\n",
    "        模板 = 翻页_参数模板\n",
    "    # dict.copy() is shallow and would leave the value lists shared with the template.\n",
    "    参数 = copy.deepcopy(模板)\n",
    "    参数['key']=key\n",
    "    参数['curPage']=curPage\n",
    "    参数['compIds']=compIds\n",
    "    return 参数\n",
    "# Page index -> request parameters for keyword '分析' at company 7983148, one entry per page.\n",
    "指定公司_关键词_翻页参数 = dict(\n",
    "    (页码, 翻页_参数调整(key=['分析'], compIds=['7983148'], curPage=[页码]))\n",
    "    for 页码 in range(长度)\n",
    ")\n",
    "\n",
    "指定公司_关键词_翻页参数"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 构建公司模板"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>compIds</th>\n",
       "      <th>key</th>\n",
       "      <th>init</th>\n",
       "      <th>searchType</th>\n",
       "      <th>headckid</th>\n",
       "      <th>flushckid</th>\n",
       "      <th>fromSearchBtn</th>\n",
       "      <th>sortFlag</th>\n",
       "      <th>ckid</th>\n",
       "      <th>siTag</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_headId</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>7863078</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>7983148</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8983822</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>8076624</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>2778803</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>9747025</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>591850</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8089425</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>1072424</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>2036768</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>4787049</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>8640905</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>2174886</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>8537928</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>182339</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>8830801</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>8660469</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>2399664</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>8899712</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>9469266</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>884492</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>2638985</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>8605497</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>8621471</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>8084886</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>5964833</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>8461883</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>9630160</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>10023177</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>7865459</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>9142549</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>12176713</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>2020322</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>3922321</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>7956861</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>20e0c3eb31215c87</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>5405c23ab621d84e2a54c23ff7675734</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     compIds    key init searchType          headckid flushckid fromSearchBtn  \\\n",
       "0    7863078  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "1    7983148  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "2    8983822  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "3    8076624  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "4    2778803  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "5    9747025  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "6     591850  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "7    8089425  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "8    1072424  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "9    2036768  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "10   4787049  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "11   8640905  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "12   2174886  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "13   8537928  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "14    182339  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "15   8830801  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "16   8660469  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "17   2399664  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "18   8899712  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "19   9469266  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "20    884492  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "21   2638985  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "22   8605497  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "23   8621471  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "24   8084886  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "25   5964833  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "26   8461883  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "27   9630160  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "28  10023177  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "29   7865459  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "30   9142549  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "31  12176713  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "32   2020322  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "33   3922321  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "34   7956861  数据分析师   -1          1  20e0c3eb31215c87         1             2   \n",
       "\n",
       "   sortFlag              ckid                                          siTag  \\\n",
       "0        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "1        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "2        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "3        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "4        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "5        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "6        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "7        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "8        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "9        15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "10       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "11       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "12       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "13       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "14       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "15       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "16       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "17       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "18       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "19       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "20       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "21       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "22       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "23       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "24       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "25       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "26       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "27       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "28       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "29       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "30       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "31       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "32       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "33       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "34       15  20e0c3eb31215c87  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "\n",
       "         d_sfrom                            d_ckId d_curPage d_pageSize  \\\n",
       "0   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "1   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "2   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "3   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "4   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "5   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "6   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "7   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "8   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "9   search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "10  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "11  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "12  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "13  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "14  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "15  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "16  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "17  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "18  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "19  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "20  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "21  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "22  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "23  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "24  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "25  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "26  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "27  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "28  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "29  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "30  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "31  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "32  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "33  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "34  search_prime  5405c23ab621d84e2a54c23ff7675734         0         40   \n",
       "\n",
       "                            d_headId  \n",
       "0   5405c23ab621d84e2a54c23ff7675734  \n",
       "1   5405c23ab621d84e2a54c23ff7675734  \n",
       "2   5405c23ab621d84e2a54c23ff7675734  \n",
       "3   5405c23ab621d84e2a54c23ff7675734  \n",
       "4   5405c23ab621d84e2a54c23ff7675734  \n",
       "5   5405c23ab621d84e2a54c23ff7675734  \n",
       "6   5405c23ab621d84e2a54c23ff7675734  \n",
       "7   5405c23ab621d84e2a54c23ff7675734  \n",
       "8   5405c23ab621d84e2a54c23ff7675734  \n",
       "9   5405c23ab621d84e2a54c23ff7675734  \n",
       "10  5405c23ab621d84e2a54c23ff7675734  \n",
       "11  5405c23ab621d84e2a54c23ff7675734  \n",
       "12  5405c23ab621d84e2a54c23ff7675734  \n",
       "13  5405c23ab621d84e2a54c23ff7675734  \n",
       "14  5405c23ab621d84e2a54c23ff7675734  \n",
       "15  5405c23ab621d84e2a54c23ff7675734  \n",
       "16  5405c23ab621d84e2a54c23ff7675734  \n",
       "17  5405c23ab621d84e2a54c23ff7675734  \n",
       "18  5405c23ab621d84e2a54c23ff7675734  \n",
       "19  5405c23ab621d84e2a54c23ff7675734  \n",
       "20  5405c23ab621d84e2a54c23ff7675734  \n",
       "21  5405c23ab621d84e2a54c23ff7675734  \n",
       "22  5405c23ab621d84e2a54c23ff7675734  \n",
       "23  5405c23ab621d84e2a54c23ff7675734  \n",
       "24  5405c23ab621d84e2a54c23ff7675734  \n",
       "25  5405c23ab621d84e2a54c23ff7675734  \n",
       "26  5405c23ab621d84e2a54c23ff7675734  \n",
       "27  5405c23ab621d84e2a54c23ff7675734  \n",
       "28  5405c23ab621d84e2a54c23ff7675734  \n",
       "29  5405c23ab621d84e2a54c23ff7675734  \n",
       "30  5405c23ab621d84e2a54c23ff7675734  \n",
       "31  5405c23ab621d84e2a54c23ff7675734  \n",
       "32  5405c23ab621d84e2a54c23ff7675734  \n",
       "33  5405c23ab621d84e2a54c23ff7675734  \n",
       "34  5405c23ab621d84e2a54c23ff7675734  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "{'字节跳动': {'compIds': ['7863078'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '腾讯': {'compIds': ['7983148'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '便利蜂': {'compIds': ['8983822'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '滴滴': {'compIds': ['8076624'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '饿了么': {'compIds': ['2778803'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '京东商城': {'compIds': ['9747025'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '58同城': {'compIds': ['591850'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '北京国富如荷网络科技有限公司': {'compIds': ['8089425'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '阿里巴巴': {'compIds': ['1072424'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '美团点评': {'compIds': ['2036768'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " 'vivo': {'compIds': ['4787049'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '岩心科技': {'compIds': ['8640905'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '小米': {'compIds': ['2174886'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '上海寻梦信息技术有限公司': {'compIds': ['8537928'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '携程': {'compIds': ['182339'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '资采信息': {'compIds': ['8830801'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '捷信消费金融有限公司': {'compIds': ['8660469'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '亚信科技': {'compIds': ['2399664'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '思爱普': {'compIds': ['8899712'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '遨游酒店信息技术(深圳)有限责任公司': {'compIds': ['9469266'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " 'Baidu': {'compIds': ['884492'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " 'Oracle甲骨文': {'compIds': ['2638985'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '北京快手科技有限公司': {'compIds': ['8605497'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '车好多集团': {'compIds': ['8621471'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '美菜': {'compIds': ['8084886'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '网易集团': {'compIds': ['5964833'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '贝壳找房(北京)科技有限公司': {'compIds': ['8461883'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '北京字节跳动网络技术有限公司': {'compIds': ['9630160'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '天津恒程科技有限公司': {'compIds': ['10023177'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '软通动力': {'compIds': ['7865459'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '深圳依时货拉拉科技有限公司': {'compIds': ['9142549'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '猎聘招聘顾问团队': {'compIds': ['12176713'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '唯品会(中国)': {'compIds': ['2020322'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " 'OPPO移动通信': {'compIds': ['3922321'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']},\n",
       " '深圳平安综合金融服务有限公司': {'compIds': ['7956861'],\n",
       "  'key': ['产品经理'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['20e0c3eb31215c87'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['20e0c3eb31215c87'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['5405c23ab621d84e2a54c23ff7675734'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['5405c23ab621d84e2a54c23ff7675734']}}"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from requests_html import HTMLSession\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "session =HTMLSession()\n",
    "url=\"https://www.liepin.com/zhaopin/?industries=&subIndustry=&dqs=&salary=&jobKind=&pubTime=&compkind=&compscale=&industryType=&searchType=1&clean_condition=&isAnalysis=&init=1&sortFlag=15&flushckid=0&fromSearchBtn=1&headckid=a98aae475f67d6d3&d_headId=f46aad599fa2d37a4837e240451ca080&d_ckId=f46aad599fa2d37a4837e240451ca080&d_sfrom=search_unknown&d_curPage=0&d_pageSize=40&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&key=%E6%95%B0%E6%8D%AE%E5%88%86%E6%9E%90%E5%B8%88\"\n",
    "r=session.get(url)\n",
    "指定公司url=r.html.xpath(\"//dd[@class='comp-list']/ul[@class='clearfix']/li/a\")\n",
    "指定公司url\n",
    "公司字典={a.xpath(\"a/span/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 指定公司url}\n",
    "公司字典\n",
    "href_列表 = [x.xpath('a/@href')[0] for x in 指定公司url]\n",
    "href_列表\n",
    "#分解url\n",
    "\n",
    "df= pd.DataFrame([urlparse(x) for x in href_列表])\n",
    "df.nunique()\n",
    "df_qs=pd.DataFrame([{k:v[0]for k,v in parse_qs(x).items()}for x in df['query']])\n",
    "display(df_qs)\n",
    "df_qs.nunique()\n",
    "#compIds 不同\n",
    "#取一例做参数模板\n",
    "def 参数拆解(url):\n",
    "    sixpart=urlparse(url)\n",
    "    out=parse_qs(sixpart.query)\n",
    "    return out\n",
    "\n",
    "参数模板=参数拆解(href_列表[0])\n",
    "参数模板\n",
    "def 参数调整(key,compIds):\n",
    "    参数=参数模板.copy()\n",
    "    参数['key']=key\n",
    "    参数['compIds']=compIds\n",
    "    return 参数\n",
    "公司代号字典={k:参数拆解(v)['compIds'][0]for k,v in 公司字典.items()}\n",
    "公司代号字典\n",
    "\n",
    "修改关键词={k:参数调整(compIds=[v],key=['产品经理'])for k,v in 公司代号字典.items()}\n",
    "修改关键词"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>compIds</th>\n",
       "      <th>key</th>\n",
       "      <th>init</th>\n",
       "      <th>searchType</th>\n",
       "      <th>headckid</th>\n",
       "      <th>flushckid</th>\n",
       "      <th>fromSearchBtn</th>\n",
       "      <th>sortFlag</th>\n",
       "      <th>ckid</th>\n",
       "      <th>siTag</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_headId</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>7863078</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>7983148</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8983822</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>8076624</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>2778803</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>9747025</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>591850</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8089425</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>1072424</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>2036768</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>4787049</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>8640905</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>2174886</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>8537928</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>182339</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>8830801</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>8660469</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>2399664</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>8899712</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>9469266</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>884492</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>2638985</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>8605497</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>8621471</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>8084886</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>5964833</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>8461883</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>9630160</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>10023177</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>7865459</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>9142549</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>12176713</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>2020322</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>3922321</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>7956861</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>-1</td>\n",
       "      <td>1</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>77831e9420db2b54</td>\n",
       "      <td>bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_prime</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>adc64b52aa0898aefcab2e8f6cf70c0e</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     compIds    key init searchType          headckid flushckid fromSearchBtn  \\\n",
       "0    7863078  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "1    7983148  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "2    8983822  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "3    8076624  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "4    2778803  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "5    9747025  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "6     591850  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "7    8089425  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "8    1072424  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "9    2036768  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "10   4787049  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "11   8640905  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "12   2174886  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "13   8537928  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "14    182339  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "15   8830801  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "16   8660469  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "17   2399664  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "18   8899712  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "19   9469266  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "20    884492  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "21   2638985  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "22   8605497  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "23   8621471  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "24   8084886  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "25   5964833  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "26   8461883  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "27   9630160  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "28  10023177  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "29   7865459  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "30   9142549  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "31  12176713  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "32   2020322  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "33   3922321  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "34   7956861  数据分析师   -1          1  77831e9420db2b54         1             2   \n",
       "\n",
       "   sortFlag              ckid                                          siTag  \\\n",
       "0        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "1        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "2        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "3        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "4        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "5        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "6        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "7        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "8        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "9        15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "10       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "11       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "12       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "13       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "14       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "15       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "16       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "17       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "18       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "19       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "20       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "21       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "22       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "23       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "24       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "25       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "26       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "27       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "28       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "29       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "30       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "31       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "32       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "33       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "34       15  77831e9420db2b54  bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw   \n",
       "\n",
       "         d_sfrom                            d_ckId d_curPage d_pageSize  \\\n",
       "0   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "1   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "2   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "3   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "4   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "5   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "6   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "7   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "8   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "9   search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "10  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "11  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "12  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "13  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "14  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "15  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "16  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "17  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "18  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "19  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "20  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "21  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "22  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "23  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "24  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "25  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "26  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "27  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "28  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "29  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "30  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "31  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "32  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "33  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "34  search_prime  adc64b52aa0898aefcab2e8f6cf70c0e         0         40   \n",
       "\n",
       "                            d_headId  \n",
       "0   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "1   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "2   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "3   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "4   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "5   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "6   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "7   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "8   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "9   adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "10  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "11  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "12  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "13  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "14  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "15  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "16  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "17  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "18  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "19  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "20  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "21  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "22  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "23  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "24  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "25  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "26  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "27  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "28  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "29  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "30  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "31  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "32  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "33  adc64b52aa0898aefcab2e8f6cf70c0e  \n",
       "34  adc64b52aa0898aefcab2e8f6cf70c0e  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "{'字节跳动': {'compIds': ['7863078'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '腾讯': {'compIds': ['7983148'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '便利蜂': {'compIds': ['8983822'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '滴滴': {'compIds': ['8076624'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '饿了么': {'compIds': ['2778803'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '京东商城': {'compIds': ['9747025'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '58同城': {'compIds': ['591850'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '北京国富如荷网络科技有限公司': {'compIds': ['8089425'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '阿里巴巴': {'compIds': ['1072424'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '美团点评': {'compIds': ['2036768'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " 'vivo': {'compIds': ['4787049'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '岩心科技': {'compIds': ['8640905'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '小米': {'compIds': ['2174886'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '上海寻梦信息技术有限公司': {'compIds': ['8537928'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '携程': {'compIds': ['182339'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '资采信息': {'compIds': ['8830801'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '捷信消费金融有限公司': {'compIds': ['8660469'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '亚信科技': {'compIds': ['2399664'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '思爱普': {'compIds': ['8899712'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '遨游酒店信息技术(深圳)有限责任公司': {'compIds': ['9469266'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " 'Baidu': {'compIds': ['884492'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " 'Oracle甲骨文': {'compIds': ['2638985'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '北京快手科技有限公司': {'compIds': ['8605497'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '车好多集团': {'compIds': ['8621471'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '美菜': {'compIds': ['8084886'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '网易集团': {'compIds': ['5964833'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '贝壳找房(北京)科技有限公司': {'compIds': ['8461883'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '北京字节跳动网络技术有限公司': {'compIds': ['9630160'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '天津恒程科技有限公司': {'compIds': ['10023177'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '软通动力': {'compIds': ['7865459'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '深圳依时货拉拉科技有限公司': {'compIds': ['9142549'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '猎聘招聘顾问团队': {'compIds': ['12176713'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '唯品会(中国)': {'compIds': ['2020322'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " 'OPPO移动通信': {'compIds': ['3922321'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']},\n",
       " '深圳平安综合金融服务有限公司': {'compIds': ['7956861'],\n",
       "  'key': ['前端'],\n",
       "  'init': ['-1'],\n",
       "  'searchType': ['1'],\n",
       "  'headckid': ['77831e9420db2b54'],\n",
       "  'flushckid': ['1'],\n",
       "  'fromSearchBtn': ['2'],\n",
       "  'sortFlag': ['15'],\n",
       "  'ckid': ['77831e9420db2b54'],\n",
       "  'siTag': ['bFGQTbwE_AAQSb-u11jrBw~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_prime'],\n",
       "  'd_ckId': ['adc64b52aa0898aefcab2e8f6cf70c0e'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['adc64b52aa0898aefcab2e8f6cf70c0e']}}"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from requests_html import HTMLSession\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "session =HTMLSession()\n",
    "url=\"https://www.liepin.com/zhaopin/?industries=&subIndustry=&dqs=&salary=&jobKind=&pubTime=&compkind=&compscale=&industryType=&searchType=1&clean_condition=&isAnalysis=&init=1&sortFlag=15&flushckid=0&fromSearchBtn=1&headckid=a98aae475f67d6d3&d_headId=f46aad599fa2d37a4837e240451ca080&d_ckId=f46aad599fa2d37a4837e240451ca080&d_sfrom=search_unknown&d_curPage=0&d_pageSize=40&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&key=%E6%95%B0%E6%8D%AE%E5%88%86%E6%9E%90%E5%B8%88\"\n",
    "r=session.get(url)\n",
    "指定公司url=r.html.xpath(\"//dd[@class='comp-list']/ul[@class='clearfix']/li/a\")\n",
    "指定公司url\n",
    "公司字典={a.xpath(\"a/span/text()\")[0]:a.xpath(\"a/@href\")[0]for a in 指定公司url}\n",
    "公司字典\n",
    "href_列表 = [x.xpath('a/@href')[0] for x in 指定公司url]\n",
    "href_列表\n",
    "#分解url\n",
    "\n",
    "df= pd.DataFrame([urlparse(x) for x in href_列表])\n",
    "df.nunique()\n",
    "df_qs=pd.DataFrame([{k:v[0]for k,v in parse_qs(x).items()}for x in df['query']])\n",
    "display(df_qs)\n",
    "df_qs.nunique()\n",
    "#compIds 不同\n",
    "#取一例做参数模板\n",
    "def 参数拆解(url):\n",
    "    sixpart=urlparse(url)\n",
    "    out=parse_qs(sixpart.query)\n",
    "    return out\n",
    "\n",
    "参数模板=参数拆解(href_列表[0])\n",
    "参数模板\n",
    "def 参数调整(key,compIds):\n",
    "    参数=参数模板.copy()\n",
    "    参数['key']=key\n",
    "    参数['compIds']=compIds\n",
    "    return 参数\n",
    "公司代号字典={k:参数拆解(v)['compIds'][0]for k,v in 公司字典.items()}\n",
    "公司代号字典\n",
    "\n",
    "keyword={k:参数调整(compIds=[v],key=['前端'])for k,v in 公司代号字典.items()}\n",
    "keyword"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "ename": "KeyError",
     "evalue": "'query'",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mKeyError\u001b[0m                                  Traceback (most recent call last)",
      "\u001b[1;32m~\\Anaconda3\\lib\\site-packages\\pandas\\core\\indexes\\base.py\u001b[0m in \u001b[0;36mget_loc\u001b[1;34m(self, key, method, tolerance)\u001b[0m\n\u001b[0;32m   2645\u001b[0m             \u001b[1;32mtry\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 2646\u001b[1;33m                 \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_engine\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget_loc\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m   2647\u001b[0m             \u001b[1;32mexcept\u001b[0m \u001b[0mKeyError\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\index.pyx\u001b[0m in \u001b[0;36mpandas._libs.index.IndexEngine.get_loc\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\index.pyx\u001b[0m in \u001b[0;36mpandas._libs.index.IndexEngine.get_loc\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas._libs.hashtable.PyObjectHashTable.get_item\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas._libs.hashtable.PyObjectHashTable.get_item\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;31mKeyError\u001b[0m: 'query'",
      "\nDuring handling of the above exception, another exception occurred:\n",
      "\u001b[1;31mKeyError\u001b[0m                                  Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-27-61d6ecf367b6>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m     10\u001b[0m     \u001b[0mhref_列表\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;33m[\u001b[0m\u001b[0mx\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mxpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'//@href'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;32mfor\u001b[0m \u001b[0mx\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mr\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mhtml\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mxpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mxpath_翻页a\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     11\u001b[0m     \u001b[0mdf\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mDataFrame\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m[\u001b[0m \u001b[0murlparse\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mx\u001b[0m\u001b[1;33m)\u001b[0m \u001b[1;32mfor\u001b[0m \u001b[0mx\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mhref_列表\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 12\u001b[1;33m     \u001b[0mdf_qs\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mDataFrame\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;33m{\u001b[0m\u001b[0mk\u001b[0m\u001b[1;33m:\u001b[0m\u001b[0mv\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mv\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mparse_qs\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mx\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m}\u001b[0m \u001b[1;32mfor\u001b[0m \u001b[0mx\u001b[0m \u001b[1;32min\u001b[0m 
\u001b[0mdf\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'query'\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m]\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     13\u001b[0m     \u001b[0mdf_qs\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdf_qs\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0massign\u001b[0m \u001b[1;33m(\u001b[0m\u001b[0mcurPage_int\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mdf_qs\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcurPage\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mastype\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mint\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m \u001b[1;31m# 变成整数\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     14\u001b[0m     \u001b[0m长度\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdf_qs\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcurPage_int\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mmax\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m+\u001b[0m\u001b[1;36m1\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m~\\Anaconda3\\lib\\site-packages\\pandas\\core\\frame.py\u001b[0m in \u001b[0;36m__getitem__\u001b[1;34m(self, key)\u001b[0m\n\u001b[0;32m   2798\u001b[0m             \u001b[1;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcolumns\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mnlevels\u001b[0m \u001b[1;33m>\u001b[0m \u001b[1;36m1\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   2799\u001b[0m                 \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_getitem_multilevel\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 2800\u001b[1;33m             \u001b[0mindexer\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcolumns\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget_loc\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m   2801\u001b[0m             \u001b[1;32mif\u001b[0m \u001b[0mis_integer\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mindexer\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   2802\u001b[0m                 \u001b[0mindexer\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;33m[\u001b[0m\u001b[0mindexer\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m~\\Anaconda3\\lib\\site-packages\\pandas\\core\\indexes\\base.py\u001b[0m in \u001b[0;36mget_loc\u001b[1;34m(self, key, method, tolerance)\u001b[0m\n\u001b[0;32m   2646\u001b[0m                 \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_engine\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget_loc\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   2647\u001b[0m             \u001b[1;32mexcept\u001b[0m \u001b[0mKeyError\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 2648\u001b[1;33m                 \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_engine\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget_loc\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_maybe_cast_indexer\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m   2649\u001b[0m         \u001b[0mindexer\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget_indexer\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mmethod\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mmethod\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mtolerance\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mtolerance\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   2650\u001b[0m         \u001b[1;32mif\u001b[0m \u001b[0mindexer\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mndim\u001b[0m \u001b[1;33m>\u001b[0m \u001b[1;36m1\u001b[0m \u001b[1;32mor\u001b[0m \u001b[0mindexer\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msize\u001b[0m \u001b[1;33m>\u001b[0m \u001b[1;36m1\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\index.pyx\u001b[0m in \u001b[0;36mpandas._libs.index.IndexEngine.get_loc\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\index.pyx\u001b[0m in \u001b[0;36mpandas._libs.index.IndexEngine.get_loc\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas._libs.hashtable.PyObjectHashTable.get_item\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;32mpandas\\_libs\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas._libs.hashtable.PyObjectHashTable.get_item\u001b[1;34m()\u001b[0m\n",
      "\u001b[1;31mKeyError\u001b[0m: 'query'"
     ]
    }
   ],
   "source": [
    "import time\n",
    "from random import random\n",
    "from requests_html import HTMLSession\n",
    "\n",
    "# Crawl every result page of each keyword, restricted by compIds=['7983148'].\n",
    "# Uses names from earlier cells: pd, urlparse, parse_qs and xpath_翻页a; 翻页_参数调整 and\n",
    "# requests_liepin are also expected to be defined before this cell runs.\n",
    "session = HTMLSession()\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "r = session.get(url)\n",
    "keywords = ['用户体验','UX','产品需求','PRD']\n",
    "\n",
    "# The pager links come from the one page fetched above, so the page count does not\n",
    "# depend on the keyword: work it out once instead of once per loop iteration.\n",
    "href_列表 = [x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "页码_列表 = [int(qs['curPage'][0])\n",
    "         for qs in (parse_qs(urlparse(href).query) for href in href_列表)\n",
    "         if 'curPage' in qs]\n",
    "# With no pager link on the page the previous DataFrame-based code stopped with\n",
    "# KeyError: 'query'; fall back to a single page (curPage 0) instead.\n",
    "长度 = max(页码_列表) + 1 if 页码_列表 else 1\n",
    "\n",
    "list_df = []\n",
    "for key in keywords:\n",
    "    # one parameter dict per page number, keyed by that page number\n",
    "    指定公司_关键词_翻页参数 = {i: 翻页_参数调整(key=[key], compIds=['7983148'], curPage=[i])\n",
    "                     for i in range(长度)}\n",
    "    print (key,长度)\n",
    "    for k, payload in 指定公司_关键词_翻页参数.items():\n",
    "        df = requests_liepin(url, params=payload)\n",
    "        time.sleep(1+4*random())  # throttle: wait 1-5 s (about 3 s on average) between requests\n",
    "        # optional per-page backup:\n",
    "        # df.to_csv(\"20春_Web数据挖掘_week04_liepin_{key}_{k}.tsv\"\n",
    "        #           .format(key=key, k=k), sep=\"\\t\", encoding=\"utf8\")\n",
    "\n",
    "        # tag every row with the keyword and the page it came from\n",
    "        list_df.append(df.assign(keyword=key, curPage=k))\n",
    "\n",
    "df_多个关键词爬取 = pd.concat(list_df).reset_index()\n",
    "df_多个关键词爬取.index.name = '序'\n",
    "df_多个关键词爬取\n",
    "# optional export:\n",
    "# df_多个关键词爬取.to_excel(\"20春_Web数据挖掘_week04_liepin_翻页_4.xlsx\",\n",
    "#                     sheet_name=\"_\".join(keywords))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def 行业参数调整(industryType, industries, key):\n",
    "    \"\"\"Return a copy of the module-level 行业参数 template with three entries overridden.\n",
    "\n",
    "    The template is copied with .copy() and left untouched; `industryType`,\n",
    "    `industries` and `key` are stored under the keys of the same name.\n",
    "    The example call below passes each value as a list.\n",
    "    \"\"\"\n",
    "    参数 = 行业参数.copy()\n",
    "    参数.update({'industryType': industryType, 'industries': industries, 'key': key})\n",
    "    return 参数\n",
    "\n",
    "\n",
    "# Example: industryType industry_09, industries 160, keyword '销售经理'.\n",
    "行业_keyword = 行业参数调整(industryType=['industry_09'], industries=['160'], key=['销售经理'])\n",
    "行业_keyword\n",
    "# TODO: unfinished draft by the author - presumably meant to build one such dict per\n",
    "# entry of 行业代号拆解 with key=['销售经理'] (行业_keyword_调整); verify before reviving."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from functools import lru_cache\n",
    "\n",
    "\n",
    "def 翻页_参数拆解(url):\n",
    "    \"\"\"Split the query string of `url` into a dict of parameter name -> list of values.\"\"\"\n",
    "    return parse_qs(urlparse(url).query)\n",
    "\n",
    "\n",
    "url =\"https://www.liepin.com/zhaopin/?isAnalysis=&dqs=&pubTime=&salary=&compIds=&subIndustry=&industryType=industry_01&compscale=&key=%E6%95%B0%E6%8D%AE%E5%88%86%E6%9E%90%E5%B8%88&init=-1&searchType=1&headckid=aa4a3ef545437f22&flushckid=1&compkind=&fromSearchBtn=2&sortFlag=15&ckid=8bc9e5a71fd77d33&jobKind=&industries=040&clean_condition=&siTag=bFGQTbwE_AAQSb-u11jrBw%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_prime&d_ckId=591ebc1760fee953b72353bace17e6cc&d_curPage=0&d_pageSize=40&d_headId=591ebc1760fee953b72353bace17e6cc\"\n",
    "\n",
    "\n",
    "@lru_cache(maxsize=None)\n",
    "def _翻页_href列表(url):\n",
    "    \"\"\"Download `url` with the notebook's `session` and return its pager hrefs as a tuple.\n",
    "\n",
    "    Cached per URL so that building the parameters for N pages costs one HTTP\n",
    "    request instead of N; call _翻页_href列表.cache_clear() to force a re-download.\n",
    "    \"\"\"\n",
    "    # only real pager links: disabled/current entries carry javascript hrefs\n",
    "    xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "    r = session.get(url)\n",
    "    return tuple(x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a))\n",
    "\n",
    "\n",
    "def 翻页_长度(url):\n",
    "    \"\"\"Return the number of result pages advertised by the pager of `url`.\n",
    "\n",
    "    This is the largest `curPage` value among the pager links plus one, or 1\n",
    "    when the page shows no pager link at all.\n",
    "    \"\"\"\n",
    "    页码 = [int(qs['curPage'][0])\n",
    "          for qs in map(翻页_参数拆解, _翻页_href列表(url))\n",
    "          if 'curPage' in qs]\n",
    "    return max(页码) + 1 if 页码 else 1\n",
    "\n",
    "\n",
    "def 翻页url(url, industryType, industries, key, curPage_int):\n",
    "    \"\"\"Build the request parameters for one result page of a search.\n",
    "\n",
    "    The template is the parsed query of the first pager link found on `url`;\n",
    "    when the page has no pager link the query of `url` itself is used, where\n",
    "    the previous version raised KeyError/IndexError.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    url : address of the search result page to read the pager from.\n",
    "    industryType, industries, key : values stored under the keys of the same\n",
    "        name (the calls in this notebook pass one-element lists).\n",
    "    curPage_int : page number to request. It is stored under the query\n",
    "        parameter 'curPage'; it used to be stored under 'curPage_int', which\n",
    "        is only a helper column name in this notebook, so every payload kept\n",
    "        the page number of the template.\n",
    "\n",
    "    Returns\n",
    "    -------\n",
    "    dict mapping parameter names to their values.\n",
    "    \"\"\"\n",
    "    href_翻页 = _翻页_href列表(url)\n",
    "    参数 = 翻页_参数拆解(href_翻页[0] if href_翻页 else url)\n",
    "    参数.update({'industryType': industryType,\n",
    "               'industries': industries,\n",
    "               'key': key,\n",
    "               'curPage': curPage_int})\n",
    "    return 参数\n",
    "\n",
    "\n",
    "# 长度 was only a local variable inside 翻页url, so the comprehension below failed with\n",
    "# NameError on a fresh kernel; compute it explicitly at module level.\n",
    "长度 = 翻页_长度(url)\n",
    "翻页_参数 = {i: 翻页url(url, industryType=['industry_01'], industries=['160'], key=['产品经理'], curPage_int=[i])\n",
    "         for i in range(长度)}\n",
    "翻页_参数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import time\n",
    "from random import random\n",
    "from requests_html import HTMLSession\n",
    "\n",
    "# Crawl every result page of each keyword for industryType industry_01 / industries 040.\n",
    "# Uses names from earlier cells: pd, urlparse, parse_qs, xpath_翻页a and 翻页url;\n",
    "# requests_liepin is also expected to be defined before this cell runs.\n",
    "session = HTMLSession()\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "r = session.get(url)\n",
    "keywords = ['用户体验','UX','产品需求','PRD']\n",
    "\n",
    "# 长度 was never assigned in this cell: it only worked when an earlier cell had left a\n",
    "# value in the kernel (NameError after Restart & Run All). Derive it from the pager of\n",
    "# the page fetched above, the same way the sibling crawl cells do.\n",
    "href_列表 = [x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "页码_列表 = [int(qs['curPage'][0])\n",
    "         for qs in (parse_qs(urlparse(href).query) for href in href_列表)\n",
    "         if 'curPage' in qs]\n",
    "长度 = max(页码_列表) + 1 if 页码_列表 else 1  # no pager link -> single page\n",
    "\n",
    "list_df = []\n",
    "for key in keywords:\n",
    "    # one parameter dict per page number, keyed by that page number\n",
    "    翻页_参数 = {i: 翻页url(url, industryType=['industry_01'], industries=['040'], key=[key], curPage_int=[i])\n",
    "             for i in range(长度)}\n",
    "    print (key,长度)\n",
    "    for k, payload in 翻页_参数.items():\n",
    "        df = requests_liepin(url, params=payload)\n",
    "        # throttle restored (it was commented out): wait 1-5 s, about 3 s on average\n",
    "        time.sleep(1+4*random())\n",
    "        # optional per-page backup:\n",
    "        # df.to_csv(\"20春_Web数据挖掘_week04_liepin_{key}_{k}.tsv\"\n",
    "        #           .format(key=key, k=k), sep=\"\\t\", encoding=\"utf8\")\n",
    "\n",
    "        # tag every row with the keyword and the page it came from\n",
    "        list_df.append(df.assign(keyword=key, curPage=k))\n",
    "\n",
    "df_all = pd.concat(list_df).reset_index()\n",
    "df_all.index.name = '顺序'\n",
    "df_all"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import time\n",
    "from random import random\n",
    "from requests_html import HTMLSession\n",
    "\n",
    "# Crawl every result page of every keyword for each company id in 公司代号字典.\n",
    "# Uses names from earlier cells: pd, urlparse, parse_qs and xpath_翻页a; 公司代号字典,\n",
    "# 翻页_参数调整 and requests_liepin are also expected to be defined before this cell runs.\n",
    "session = HTMLSession()\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "r = session.get(url)\n",
    "keywords = ['产品经理','运营','新媒体','用户研究','交互','前端','设计','数据分析','PRD','APP','python','可视化']\n",
    "\n",
    "# The pager links come from the one page fetched above, so the page count depends on\n",
    "# neither the company nor the keyword: work it out once, outside both loops.\n",
    "href_列表 = [x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "页码_列表 = [int(qs['curPage'][0])\n",
    "         for qs in (parse_qs(urlparse(href).query) for href in href_列表)\n",
    "         if 'curPage' in qs]\n",
    "# With no pager link on the page the previous DataFrame-based code stopped with\n",
    "# KeyError: 'query'; fall back to a single page (curPage 0) instead.\n",
    "长度 = max(页码_列表) + 1 if 页码_列表 else 1\n",
    "\n",
    "list_df = []\n",
    "for number in 公司代号字典.values():\n",
    "    for key in keywords:\n",
    "        # one parameter dict per page number, keyed by that page number\n",
    "        指定公司_关键词_翻页参数 = {i: 翻页_参数调整(key=[key], compIds=[number], curPage=[i])\n",
    "                         for i in range(长度)}\n",
    "        print (key,number,长度)\n",
    "        for k, payload in 指定公司_关键词_翻页参数.items():\n",
    "            df = requests_liepin(url, params=payload)\n",
    "            time.sleep(2+8*random())  # throttle: wait 2-10 s (about 6 s on average) between requests\n",
    "            # optional per-page backup:\n",
    "            # df.to_csv(\"20春_Web数据挖掘_week07_liepin_{key}_{k}.tsv\"\n",
    "            #           .format(key=key, k=k), sep=\"\\t\", encoding=\"utf8\")\n",
    "\n",
    "            # tag every row with the keyword and the page it came from\n",
    "            # NOTE(review): rows are not tagged with the company id `number` - confirm that\n",
    "            # the frame returned by requests_liepin already identifies the company\n",
    "            list_df.append(df.assign(keyword=key, curPage=k))\n",
    "\n",
    "df_网新 = pd.concat(list_df).reset_index()\n",
    "df_网新.index.name = '顺序'\n",
    "df_网新"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.7"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
